# Torch kernel benchmark: a standalone executable built from one CUDA source.
add_executable(torch_bench
  torch_bench.cu
)

# Ask for at least the CUDA C++14 dialect when compiling this target.
target_compile_features(torch_bench
  PRIVATE
    cuda_std_14
)

# Header search paths. Both variables are set outside this snippet
# (presumably by find_package(Torch) and find_package(Python) -- confirm).
target_include_directories(torch_bench
  PRIVATE
    ${TORCH_INCLUDE_DIRS}
    ${Python_INCLUDE_DIRS}
)

# Extra compiler flags, all forwarded unquoted so list values expand into
# separate arguments.
# NOTE(review): the OpenMP flags come from the CUDA-language variable while the
# link line below uses the CXX target -- confirm OpenMP_CUDA_FLAGS is actually
# populated by the surrounding build.
target_compile_options(torch_bench
  PRIVATE
    ${TORCH_CXX_FLAGS}
    ${gswitch_NVCC_FLAGS}
    ${OpenMP_CUDA_FLAGS}
)

# Link against the Torch libraries and the OpenMP::OpenMP_CXX target.
target_link_libraries(torch_bench
  PRIVATE
    ${TORCH_LIBRARIES}
    OpenMP::OpenMP_CXX
)
